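# Alternate configuration, currently disabled (everything through the
# commented-out python command below): QwQ-32B with --tp 4 on devices 0,1,2,3.
# export GLOO_SOCKET_IFNAME=enp23s0f3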
# export TP_SOCKET_IFNAME=enp23s0f3
# export ASCEND_RT_VISIBLE_DEVICES=0,1,2,3
# export VLLM_USE_V1=1
# export VLLM_WORKER_MULTIPROC_METHOD=fork
# export VLLM_ENABLE_MC2=0
# export USING_LCCL_COM=0

# export OMNI_USE_QWEN=1

# python start_api_servers.py \
#         --num-servers 1 \
#         --model-path /data/model/QwQ-32B \
#         --master-ip 7.150.13.139 \
#         --tp 4 \
#         --master-port 60666 \
#         --served-model-name qwen \
#         --log-dir apiserverlog \
#         --extra-args "--enforce-eager " \
#         --base-api-port 8888


# Active configuration: launch one API server for Qwen2.5-7B-Instruct with
# --tp 1, exposing only device 0 to the runtime.

# Both socket-interface variables are set to the same value
# (presumably the host NIC name -- confirm on the target machine).
GLOO_SOCKET_IFNAME=enp23s0f3
TP_SOCKET_IFNAME=enp23s0f3
export GLOO_SOCKET_IFNAME TP_SOCKET_IFNAME

# Only device index 0 is made visible.
ASCEND_RT_VISIBLE_DEVICES=0
export ASCEND_RT_VISIBLE_DEVICES

# Switches read by the launched processes; their exact semantics are defined
# by the consuming code, which is not part of this script.
VLLM_USE_V1=1
VLLM_WORKER_MULTIPROC_METHOD=fork
VLLM_ENABLE_MC2=0
USING_LCCL_COM=0
OMNI_USE_QWEN=1
export VLLM_USE_V1 VLLM_WORKER_MULTIPROC_METHOD VLLM_ENABLE_MC2
export USING_LCCL_COM OMNI_USE_QWEN

# Argument order is kept exactly as before. The value passed to --extra-args
# deliberately retains its trailing space inside the quotes.
python start_api_servers.py \
  --num-servers 1 --model-path /data/model/Qwen2.5-7B-Instruct \
  --master-ip 7.150.13.139 --tp 1 --master-port 60666 \
  --served-model-name qwen --log-dir apiserverlog \
  --extra-args "--enforce-eager " \
  --base-api-port 8888
